<!DOCTYPE HTML>
<html lang="zh-CN">
    
    <head>
        <!-- Encoding is declared exactly once, and first, so the parser sees it
             before any non-ASCII text (the title and the next/prev paths below). -->
        <meta charset="UTF-8">
        <meta http-equiv="X-UA-Compatible" content="IE=edge">
        <title>Selenium | 爬虫</title>
        <meta name="description" content="Selenium 入门：结合 Chrome、PhantomJS 与 Chrome headless 模式进行浏览器自动化和爬虫数据抓取。">
        <meta name="generator" content="GitBook 2.6.7">

        <!-- Mobile and home-screen hints. The viewport deliberately does not set
             user-scalable=no, so readers can still pinch-zoom the page. -->
        <meta name="HandheldFriendly" content="true">
        <meta name="viewport" content="width=device-width, initial-scale=1">
        <meta name="apple-mobile-web-app-capable" content="yes">
        <meta name="apple-mobile-web-app-status-bar-style" content="black">
        <link rel="apple-touch-icon-precomposed" sizes="152x152" href="../gitbook/images/apple-touch-icon-precomposed-152.png">
        <link rel="shortcut icon" href="../gitbook/images/favicon.ico" type="image/x-icon">

        <!-- Core GitBook stylesheet first, then one stylesheet per plugin
             (highlight, search, fontsettings), in the original load order. -->
        <link rel="stylesheet" href="../gitbook/style.css">
        <link rel="stylesheet" href="../gitbook/plugins/gitbook-plugin-highlight/website.css">
        <link rel="stylesheet" href="../gitbook/plugins/gitbook-plugin-search/search.css">
        <link rel="stylesheet" href="../gitbook/plugins/gitbook-plugin-fontsettings/website.css">

        <!-- Sequential navigation: the pages after and before this one. -->
        <link rel="next" href="../进程线程协程/introduce.html">
        <link rel="prev" href="../代理/proxy.html">
    </head>
    <body>
        
        
    <div class="book"
        data-level="6"
        data-chapter-title="Selenium"
        data-filepath="Selenium/Selenium.md"
        data-basepath=".."
        data-revision="Fri Oct 19 2018 08:44:08 GMT+0800 (中国标准时间)"
        data-innerlanguage="">
    

<div class="book-summary">
    <nav role="navigation">
        <ul class="summary">
            
            
            
            

            

            
    
        <li class="chapter " data-level="0" data-path="index.html">
            
                
                    <a href="../index.html">
                
                        <i class="fa fa-check"></i>
                        
                        序言
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="1" data-path="认识爬虫/introduceSpider.html">
            
                
                    <a href="../认识爬虫/introduceSpider.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>1.</b>
                        
                        认识爬虫
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="1.1" data-path="认识爬虫/http.html">
            
                
                    <a href="../认识爬虫/http.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>1.1.</b>
                        
                        HTTP
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="1.2" data-path="认识爬虫/Requests.html">
            
                
                    <a href="../认识爬虫/Requests.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>1.2.</b>
                        
                        requests
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="1.3" data-path="认识爬虫/初步爬虫.html">
            
                
                    <a href="../认识爬虫/初步爬虫.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>1.3.</b>
                        
                        初步爬虫小项目
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="2" data-path="正则表达式/正则表达式.html">
            
                
                    <a href="../正则表达式/正则表达式.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.</b>
                        
                        正则表达式
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="2.1" data-path="正则表达式/正则表达式练习.html">
            
                
                    <a href="../正则表达式/正则表达式练习.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.1.</b>
                        
                        正则表达式练习
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.2" data-path="正则表达式/正则表达式之后的第一个项目.html">
            
                
                    <a href="../正则表达式/正则表达式之后的第一个项目.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.2.</b>
                        
                        正则表达式之后的第一个项目
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.3" data-path="正则表达式/正则表达式常用表.html">
            
                
                    <a href="../正则表达式/正则表达式常用表.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.3.</b>
                        
                        正则表达式常用表
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.4" data-path="正则表达式/正则表达式重点1.html">
            
                
                    <a href="../正则表达式/正则表达式重点1.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.4.</b>
                        
                        正则表达式重点
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.5" data-path="正则表达式/正则表达式常问问题.html">
            
                
                    <a href="../正则表达式/正则表达式常问问题.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.5.</b>
                        
                        正则表达式常问问题
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="2.6" data-path="正则表达式/正则爬虫练习.html">
            
                
                    <a href="../正则表达式/正则爬虫练习.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>2.6.</b>
                        
                        正则爬虫项目练习
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="3" data-path="XPATH/xpath-in.html">
            
                
                    <a href="../XPATH/xpath-in.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>3.</b>
                        
                        XPATH
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="3.1" data-path="XPATH/Xpath.html">
            
                
                    <a href="../XPATH/Xpath.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>3.1.</b>
                        
                        XPATH认识
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="3.2" data-path="XPATH/Xpath的代码例子.html">
            
                
                    <a href="../XPATH/Xpath的代码例子.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>3.2.</b>
                        
                        XPATH的代码例子
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="3.3" data-path="XPATH/xpath的爬虫练习.html">
            
                
                    <a href="../XPATH/xpath的爬虫练习.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>3.3.</b>
                        
                        XPATH的爬虫练习
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="4" data-path="BeautifulSoup/BeautifulSoup.html">
            
                
                    <a href="../BeautifulSoup/BeautifulSoup.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>4.</b>
                        
                        BeautifulSoup
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="4.1" data-path="BeautifulSoup/常用的css选择器.html">
            
                
                    <a href="../BeautifulSoup/常用的css选择器.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>4.1.</b>
                        
                        常用的css选择器
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="4.2" data-path="BeautifulSoup/BeautifulSoup4的各种例子.html">
            
                
                    <a href="../BeautifulSoup/BeautifulSoup4的各种例子.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>4.2.</b>
                        
                        BeautifulSoup4的各种例子
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="5" data-path="代理/proxy.html">
            
                
                    <a href="../代理/proxy.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>5.</b>
                        
                        ip代理池项目
                    </a>
            
            
        </li>
    
        <li class="chapter active" data-level="6" data-path="Selenium/Selenium.html">
            
                
                    <a href="../Selenium/Selenium.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>6.</b>
                        
                        Selenium
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7" data-path="进程线程协程/introduce.html">
            
                
                    <a href="../进程线程协程/introduce.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.</b>
                        
                        进程线程协程
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="7.1" data-path="进程线程协程/gevent.html">
            
                
                    <a href="../进程线程协程/gevent.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.1.</b>
                        
                        gevent
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7.2" data-path="进程线程协程/green_let.html">
            
                
                    <a href="../进程线程协程/green_let.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.2.</b>
                        
                        green_let
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7.3" data-path="进程线程协程/yield.html">
            
                
                    <a href="../进程线程协程/yield.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.3.</b>
                        
                        yield
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7.4" data-path="进程线程协程/multiprecessing.html">
            
                
                    <a href="../进程线程协程/multiprecessing.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.4.</b>
                        
                        multiprecessing
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="7.5" data-path="进程线程协程/threading.html">
            
                
                    <a href="../进程线程协程/threading.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>7.5.</b>
                        
                        threading
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="8" data-path="scrapy框架/scrapy.html">
            
                
                    <a href="../scrapy框架/scrapy.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>8.</b>
                        
                        Scrapy
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="8.1" data-path="scrapy框架/scrapy_setting.html">
            
                
                    <a href="../scrapy框架/scrapy_setting.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>8.1.</b>
                        
                        scrapy_setting
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="8.2" data-path="scrapy框架/模块作用.html">
            
                
                    <a href="../scrapy框架/模块作用.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>8.2.</b>
                        
                        模块作用
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="8.3" data-path="scrapy框架/19个中间件.html">
            
                
                    <a href="../scrapy框架/19个中间件.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>8.3.</b>
                        
                        19个中间件
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="9" data-path="scrapy-redis分布式/scrapy-redis.html">
            
                
                    <a href="../scrapy-redis分布式/scrapy-redis.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>9.</b>
                        
                        scrapy-redis分布式
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="9.1" data-path="scrapy-redis分布式/scrapy-redis的改造方法.html">
            
                
                    <a href="../scrapy-redis分布式/scrapy-redis的改造方法.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>9.1.</b>
                        
                        scrapy-redis的改造方法
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="10" data-path="spider_projects/introduce.html">
            
                
                    <a href="../spider_projects/introduce.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.</b>
                        
                        spider_projects
                    </a>
            
            
            <ul class="articles">
                
    
        <li class="chapter " data-level="10.1" data-path="spider_projects/使用代理在普通爬虫脚本下.html">
            
                
                    <a href="../spider_projects/使用代理在普通爬虫脚本下.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.1.</b>
                        
                        使用代理在普通爬虫脚本下
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.2" data-path="spider_projects/xpath爬取前程无忧的数据.html">
            
                
                    <a href="../spider_projects/xpath爬取前程无忧的数据.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.2.</b>
                        
                        xpath爬取前程无忧的数据
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.3" data-path="spider_projects/存储数据库的脚本.html">
            
                
                    <a href="../spider_projects/存储数据库的脚本.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.3.</b>
                        
                        存储数据库的脚本
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.4" data-path="spider_projects/weibo.html">
            
                
                    <a href="../spider_projects/weibo.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.4.</b>
                        
                        爬取央视新闻微博
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.5" data-path="spider_projects/weibo2.html">
            
                
                    <a href="../spider_projects/weibo2.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.5.</b>
                        
                        爬取明星的微博
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.6" data-path="spider_projects/liepin.html">
            
                
                    <a href="../spider_projects/liepin.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.6.</b>
                        
                        爬取猎聘的职位信息Crawl
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.7" data-path="spider_projects/zhilianRe.html">
            
                
                    <a href="../spider_projects/zhilianRe.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.7.</b>
                        
                        纯正则爬取智联的职位信息
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.8" data-path="spider_projects/setting.html">
            
                
                    <a href="../spider_projects/setting.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.8.</b>
                        
                        scrapy中的setting
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.9" data-path="spider_projects/items.html">
            
                
                    <a href="../spider_projects/items.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.9.</b>
                        
                        scrapy中的items
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.10" data-path="spider_projects/pipeline.html">
            
                
                    <a href="../spider_projects/pipeline.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.10.</b>
                        
                        scrapy中的pipeline
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.11" data-path="spider_projects/middlewares.html">
            
                
                    <a href="../spider_projects/middlewares.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.11.</b>
                        
                        scrapy中的middlewares
                    </a>
            
            
        </li>
    
        <li class="chapter " data-level="10.12" data-path="spider_projects/框架中的代码运行脚本.html">
            
                
                    <a href="../spider_projects/框架中的代码运行脚本.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>10.12.</b>
                        
                        框架中的代码运行脚本
                    </a>
            
            
        </li>
    

            </ul>
            
        </li>
    
        <li class="chapter " data-level="11" data-path="爬虫的面试题/面试题1-10.html">
            
                
                    <a href="../爬虫的面试题/面试题1-10.html">
                
                        <i class="fa fa-check"></i>
                        
                            <b>11.</b>
                        
                        爬虫面试题
                    </a>
            
            
        </li>
    


            
            <li class="divider"></li>
            <li>
                <!-- External credit link. "_blank" (with the underscore) is the reserved
                     keyword that opens a new browsing context; plain "blank" would instead
                     name a context that every click reuses. rel="noopener noreferrer"
                     keeps the opened page from reaching back through window.opener. -->
                <a href="https://www.gitbook.com" target="_blank" rel="noopener noreferrer" class="gitbook-link">
                    Published with GitBook
                </a>
            </li>
            
        </ul>
    </nav>
</div>

    <div class="book-body">
        <div class="body-inner">
            <div class="book-header" role="navigation">
                <!-- Header bar of the page body: an (empty) left-hand action slot
                     followed by the book title. -->
                <!-- Actions Left -->

                <!-- Title: the icon-font glyph carries no text, so it is hidden from
                     assistive technology; the link points at the book root. -->
                <h1>
                    <i class="fa fa-circle-o-notch fa-spin" aria-hidden="true"></i>
                    <a href="../">爬虫</a>
                </h1>
            </div>

            <div class="page-wrapper" tabindex="-1" role="main">
                <div class="page-inner">
                
                
                    <section class="normal" id="section-">
                    
                        <h1 id="selenium">Selenium</h1>
<hr>
<p>Selenium是一个Web的自动化测试工具，最初是为网站自动化测试而开发的，类似于我们玩游戏用的按键精灵，可以按指定的命令自动操作，不同的是Selenium 可以直接运行在浏览器上，它支持所有主流的浏览器（包括PhantomJS这些无界面的浏览器）。</p>
<p>Selenium &#x53EF;&#x4EE5;&#x6839;&#x636E;&#x6211;&#x4EEC;&#x7684;&#x6307;&#x4EE4;&#xFF0C;&#x8BA9;&#x6D4F;&#x89C8;&#x5668;&#x81EA;&#x52A8;&#x52A0;&#x8F7D;&#x9875;&#x9762;&#xFF0C;&#x83B7;&#x53D6;&#x9700;&#x8981;&#x7684;&#x6570;&#x636E;&#xFF0C;&#x751A;&#x81F3;&#x9875;&#x9762;&#x622A;&#x5C4F;&#xFF0C;&#x6216;&#x8005;&#x5224;&#x65AD;&#x7F51;&#x7AD9;&#x4E0A;&#x67D0;&#x4E9B;&#x52A8;&#x4F5C;&#x662F;&#x5426;&#x53D1;&#x751F;&#x3002;</p>
<p>&#x53EF;&#x4EE5;&#x4ECE; PyPI &#x7F51;&#x7AD9;&#x4E0B;&#x8F7D; Selenium&#x5E93;<a href="https://pypi.python.org/simple/selenium" target="_blank">https://pypi.python.org/simple/selenium</a> &#xFF0C;&#x4E5F;&#x53EF;&#x4EE5;&#x7528; &#x7B2C;&#x4E09;&#x65B9;&#x7BA1;&#x7406;&#x5668; pip&#x7528;&#x547D;&#x4EE4;&#x5B89;&#x88C5;&#xFF1A;<code>pip install selenium</code></p>
<p>Selenium &#x5B98;&#x65B9;&#x53C2;&#x8003;&#x6587;&#x6863;&#xFF1A;<a href="http://selenium-python.readthedocs.io/index.html" target="_blank">http://selenium-python.readthedocs.io/index.html</a></p>
<p>chromedriver &#x9A71;&#x52A8;&#x4E0B;&#x8F7D;</p>
<p><a href="https://npm.taobao.org/mirrors/chromedriver/" target="_blank">https://npm.taobao.org/mirrors/chromedriver/</a></p>
<hr>
<p>当页面中有需要 JavaScript 去动态加载的内容，而我们又不好模拟这段 JavaScript 的时候，
就可以使用 Selenium 驱动浏览器来加载页面，再从渲染后的页面中获取数据。</p>
<hr>
<h1 id="&#x4F8B;&#x5982;&#xFF1A;&#x767E;&#x5EA6;&#x4E0A;&#x641C;&#x7D22;&#x4EC0;&#x4E48;&#x662F;&#x5EFA;&#x8BBE;&#x6027;&#x95EE;&#x9898;">&#x4F8B;&#x5982;&#xFF1A;&#x767E;&#x5EA6;&#x4E0A;&#x641C;&#x7D22;&#x4EC0;&#x4E48;&#x662F;&#x5EFA;&#x8BBE;&#x6027;&#x95EE;&#x9898;</h1>
<pre><code class="lang-python"><span class="hljs-keyword">from</span> selenium <span class="hljs-keyword">import</span> webdriver

<span class="hljs-comment">#&#x8FD9;&#x4E2A;&#x9A71;&#x52A8;&#x8981;&#x6DFB;&#x52A0;&#x5230;&#x73AF;&#x5883;&#x53D8;&#x91CF;&#x4E2D;&#xFF0C;&#x5982;&#x679C;&#x6CA1;&#x6709;&#x6DFB;&#x52A0;&#x5230;&#x73AF;&#x5883;&#x53D8;&#x91CF;&#x4E2D;&#xFF0C;&#x90A3;&#x4E48;&#x6211;&#x4EEC;&#x53EF;&#x4EE5;&#x4F7F;&#x7528;&#x5B83;&#x7684;&#x8DEF;&#x5F84;&#x3002;</span>
driver = webdriver.Chrome()

driver.get(<span class="hljs-string">&apos;http://www.baidu.com&apos;</span>)

driver.find_element_by_id(<span class="hljs-string">&apos;kw&apos;</span>).send_keys(<span class="hljs-string">&apos;&#x5EFA;&#x8BBE;&#x6027;&#x95EE;&#x9898;&#x662F;&#x4EC0;&#x4E48;&apos;</span>)
driver.find_element_by_id(<span class="hljs-string">&apos;su&apos;</span>).click()
</code></pre>
<hr>
<h1 id="&#x6817;&#x5B50;&#xFF1A;&#x4EAC;&#x4E1C;&#x4E0A;&#x641C;&#x7D22;&#x5976;&#x74F6;&#x6D88;&#x6BD2;&#x5668;">&#x6817;&#x5B50;&#xFF1A;&#x4EAC;&#x4E1C;&#x4E0A;&#x641C;&#x7D22;&#x5976;&#x74F6;&#x6D88;&#x6BD2;&#x5668;</h1>
<pre><code class="lang-python"><span class="hljs-keyword">from</span> selenium <span class="hljs-keyword">import</span> webdriver

driver = webdriver.Chrome()

driver.get(<span class="hljs-string">&apos;https://www.jd.com&apos;</span>)

driver.find_element_by_id(<span class="hljs-string">&apos;key&apos;</span>).send_keys(<span class="hljs-string">&apos;&#x5976;&#x74F6;&#x6D88;&#x6BD2;&#x5668;&apos;</span>)
driver.find_element_by_class_name(<span class="hljs-string">&apos;button&apos;</span>).click()
</code></pre>
<hr>
<p>Selenium &#x81EA;&#x5DF1;&#x4E0D;&#x5E26;&#x6D4F;&#x89C8;&#x5668;&#xFF0C;&#x4E0D;&#x652F;&#x6301;&#x6D4F;&#x89C8;&#x5668;&#x7684;&#x529F;&#x80FD;&#xFF0C;&#x5B83;&#x9700;&#x8981;&#x4E0E;&#x7B2C;&#x4E09;&#x65B9;&#x6D4F;&#x89C8;&#x5668;&#x7ED3;&#x5408;&#x5728;&#x4E00;&#x8D77;&#x624D;&#x80FD;&#x4F7F;&#x7528;&#x3002;&#x4F46;&#x662F;&#x6211;&#x4EEC;&#x6709;&#x65F6;&#x5019;&#x9700;&#x8981;&#x8BA9;&#x5B83;&#x5185;&#x5D4C;&#x5728;&#x4EE3;&#x7801;&#x4E2D;&#x8FD0;&#x884C;&#xFF0C;&#x6240;&#x4EE5;&#x6211;&#x4EEC;&#x53EF;&#x4EE5;&#x7528;&#x4E00;&#x4E2A;&#x53EB; PhantomJS &#x7684;&#x5DE5;&#x5177;&#x4EE3;&#x66FF;&#x771F;&#x5B9E;&#x7684;&#x6D4F;&#x89C8;&#x5668;&#x3002;</p>
<hr>
<h1 id="phantomjs">PhantomJS</h1>
<p>PhantomJS &#x662F;&#x4E00;&#x4E2A;&#x57FA;&#x4E8E;Webkit&#x7684;&#x201C;&#x65E0;&#x754C;&#x9762;&#x201D;(headless)&#x6D4F;&#x89C8;&#x5668;&#xFF0C;&#x5B83;&#x4F1A;&#x628A;&#x7F51;&#x7AD9;&#x52A0;&#x8F7D;&#x5230;&#x5185;&#x5B58;&#x5E76;&#x6267;&#x884C;&#x9875;&#x9762;&#x4E0A;&#x7684; JavaScript&#xFF0C;&#x56E0;&#x4E3A;&#x4E0D;&#x4F1A;&#x5C55;&#x793A;&#x56FE;&#x5F62;&#x754C;&#x9762;&#xFF0C;&#x6240;&#x4EE5;&#x8FD0;&#x884C;&#x8D77;&#x6765;&#x6BD4;&#x5B8C;&#x6574;&#x7684;&#x6D4F;&#x89C8;&#x5668;&#x8981;&#x9AD8;&#x6548;&#x3002;</p>
<p>如果我们把 Selenium 和 PhantomJS 结合在一起，就可以运行一个非常强大的网络爬虫了，这个爬虫可以处理 JavaScript、Cookie、headers，以及任何我们真实用户需要做的事情。</p>
<p>注意：PhantomJS 只能从它的官方网站（<a href="http://phantomjs.org/download.html" target="_blank">http://phantomjs.org/download.html</a>）下载。因为 PhantomJS 是一个功能完善(虽然无界面)的浏览器而非一个 Python 库，所以它不需要像 Python 的其他库一样安装，但我们可以通过Selenium调用PhantomJS来直接使用。</p>
<p>PhantomJS &#x5B98;&#x65B9;&#x53C2;&#x8003;&#x6587;&#x6863;&#xFF1A;<a href="http://phantomjs.org/documentation" target="_blank">http://phantomjs.org/documentation</a></p>
<hr>
<h3 id="selenium--phantomjs">selenium + phantomJS</h3>
<h3 id="selenium--chrome-headless-&#x6A21;&#x5F0F;">selenium + Chrome headless &#x6A21;&#x5F0F;</h3>
<p>&#x4F46;&#x662F;&#x73B0;&#x5728;&#x90FD;&#x4E0D;&#x7528;<code>selenium + phantomJS</code>,&#x4E00;&#x822C;&#x4F7F;&#x7528;<code>selenium + Chrome headless &#x6A21;&#x5F0F;</code></p>
<h3 id="&#x6817;&#x5B50;&#xFF1A;&#x722C;&#x53D6;&#x8C46;&#x74E3;&#xFF0C;&#x9700;&#x8981;&#x767B;&#x5F55;&#x9A8C;&#x8BC1;&#x8FDB;&#x5165;&#x540E;&#x722C;&#x53D6;&#x4FE1;&#x606F;&#x3002;">&#x6817;&#x5B50;&#xFF1A;&#x722C;&#x53D6;&#x8C46;&#x74E3;&#xFF0C;&#x9700;&#x8981;&#x767B;&#x5F55;&#x9A8C;&#x8BC1;&#x8FDB;&#x5165;&#x540E;&#x722C;&#x53D6;&#x4FE1;&#x606F;&#x3002;</h3>
<pre><code class="lang-python">
<span class="hljs-comment"># Headless mode: selenium drives Chrome without opening a browser window.</span>
<span class="hljs-keyword">from</span> selenium <span class="hljs-keyword">import</span> webdriver
<span class="hljs-keyword">from</span> selenium.webdriver.common.by <span class="hljs-keyword">import</span> By
<span class="hljs-keyword">from</span> lxml <span class="hljs-keyword">import</span> etree
<span class="hljs-keyword">import</span> requests
<span class="hljs-keyword">import</span> base64

<span class="hljs-comment"># Placeholders: fill in your own login and API code before running.</span>
<span class="hljs-comment"># Real credentials must never be hard-coded in published examples.</span>
DOUBAN_ACCOUNT = <span class="hljs-string">&apos;YOUR_DOUBAN_ACCOUNT&apos;</span>
DOUBAN_PASSWORD = <span class="hljs-string">&apos;YOUR_DOUBAN_PASSWORD&apos;</span>
DAMA_APPCODE = <span class="hljs-string">&apos;YOUR_APPCODE&apos;</span>

option = webdriver.ChromeOptions()
option.add_argument(<span class="hljs-string">&apos;--headless&apos;</span>)
option.add_argument(<span class="hljs-string">&apos;--disable-gpu&apos;</span>)

<span class="hljs-comment"># `options=` replaces the deprecated `chrome_options=` keyword.</span>
driver = webdriver.Chrome(options=option)
<span class="hljs-keyword">try</span>:
    driver.get(<span class="hljs-string">&apos;https://accounts.douban.com/login?alias=&amp;redir=https%3A%2F%2Fwww.douban.com%2F&amp;source=index_nav&amp;error=1016&apos;</span>)
    <span class="hljs-comment"># find_element(By...) works on both selenium 3 and selenium 4.</span>
    driver.find_element(By.ID, <span class="hljs-string">&apos;email&apos;</span>).send_keys(DOUBAN_ACCOUNT)
    driver.find_element(By.ID, <span class="hljs-string">&apos;password&apos;</span>).send_keys(DOUBAN_PASSWORD)

    <span class="hljs-comment"># page_source is the HTML of the page currently loaded in the browser.</span>
    html_str = driver.page_source
    html_ele = etree.HTML(html_str)
    captcha_src = html_ele.xpath(<span class="hljs-string">&apos;//img[@id=&quot;captcha_image&quot;]/@src&apos;</span>)

    <span class="hljs-comment"># xpath returns an empty list when the page has no captcha image;</span>
    <span class="hljs-comment"># only call the recognition service when one is present.</span>
    <span class="hljs-keyword">if</span> captcha_src:
        response = requests.get(captcha_src[<span class="hljs-number">0</span>])

        <span class="hljs-comment"># base64-encode the captcha image bytes</span>
        v_pic = base64.b64encode(response.content)
        <span class="hljs-comment"># captcha type sent to the recognition service</span>
        v_type = <span class="hljs-string">&apos;cn&apos;</span>

        <span class="hljs-comment"># form fields of the recognition request</span>
        form_data = {
            <span class="hljs-string">&apos;v_pic&apos;</span>: v_pic,
            <span class="hljs-string">&apos;v_type&apos;</span>: v_type
        }

        <span class="hljs-comment"># the recognition request is authorized through this header</span>
        headers = {
            <span class="hljs-string">&apos;Authorization&apos;</span>: <span class="hljs-string">&apos;APPCODE &apos;</span> + DAMA_APPCODE
        }
        dama_url = <span class="hljs-string">&apos;http://yzmplus.market.alicloudapi.com/fzyzm&apos;</span>
        response = requests.post(dama_url, data=form_data, headers=headers)
        print(response.text)
        res_dict = response.json()
        valid_image = res_dict[<span class="hljs-string">&apos;v_code&apos;</span>]
        driver.find_element(By.ID, <span class="hljs-string">&apos;captcha_field&apos;</span>).send_keys(valid_image)

    driver.find_element(By.CLASS_NAME, <span class="hljs-string">&apos;btn-submit&apos;</span>).click()

    <span class="hljs-comment"># Join the browser cookies into one Cookie header value.</span>
    cookies = <span class="hljs-string">&apos;; &apos;</span>.join(
        cookie[<span class="hljs-string">&apos;name&apos;</span>] + <span class="hljs-string">&apos;=&apos;</span> + cookie[<span class="hljs-string">&apos;value&apos;</span>] <span class="hljs-keyword">for</span> cookie <span class="hljs-keyword">in</span> driver.get_cookies()
    )
<span class="hljs-keyword">finally</span>:
    <span class="hljs-comment"># Always quit the browser, even on errors, so no Chrome process is left running.</span>
    driver.quit()
print(cookies)

<span class="hljs-comment"># Reuse the logged-in cookies with requests to fetch a page that needs login.</span>
url = <span class="hljs-string">&apos;https://www.douban.com/mine/wallet/#/all-spending?page=1&apos;</span>
headers = {
    <span class="hljs-string">&apos;Cookie&apos;</span>: cookies,
    <span class="hljs-string">&apos;User-Agent&apos;</span>: <span class="hljs-string">&apos;Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.92 Safari/537.36&apos;</span>
}
response = requests.get(url, headers=headers)
print(response.status_code)
<span class="hljs-keyword">with</span> open(<span class="hljs-string">&apos;douban_money1.html&apos;</span>, <span class="hljs-string">&apos;wb&apos;</span>) <span class="hljs-keyword">as</span> f:
    f.write(response.content)
</code></pre>
<hr>
<h3 id="&#x5BF9;&#x6BD4;&#xFF1A;&#x4E0B;&#x9762;&#x662F;&#x6709;&#x754C;&#x9762;&#x6A21;&#x5F0F;">&#x5BF9;&#x6BD4;&#xFF1A;&#x4E0B;&#x9762;&#x662F;&#x6709;&#x754C;&#x9762;&#x6A21;&#x5F0F;</h3>
<pre><code class="lang-python">
<span class="hljs-comment"># Headed mode: selenium drives a visible Chrome window.</span>
<span class="hljs-keyword">from</span> selenium <span class="hljs-keyword">import</span> webdriver
<span class="hljs-keyword">from</span> selenium.webdriver.common.by <span class="hljs-keyword">import</span> By
<span class="hljs-keyword">from</span> lxml <span class="hljs-keyword">import</span> etree
<span class="hljs-keyword">import</span> requests
<span class="hljs-keyword">import</span> base64

<span class="hljs-comment"># Placeholders: fill in your own login and API code before running.</span>
<span class="hljs-comment"># Real credentials must never be hard-coded in published examples.</span>
DOUBAN_ACCOUNT = <span class="hljs-string">&apos;YOUR_DOUBAN_ACCOUNT&apos;</span>
DOUBAN_PASSWORD = <span class="hljs-string">&apos;YOUR_DOUBAN_PASSWORD&apos;</span>
DAMA_APPCODE = <span class="hljs-string">&apos;YOUR_APPCODE&apos;</span>

<span class="hljs-comment"># selenium + phantomJS</span>
<span class="hljs-comment"># selenium + Chrome headless mode (no browser window)</span>

<span class="hljs-comment"># The headless options stay commented out here so the browser window is shown:</span>
<span class="hljs-comment"># option = webdriver.ChromeOptions()</span>
<span class="hljs-comment"># option.add_argument(&apos;--headless&apos;)</span>
<span class="hljs-comment"># option.add_argument(&apos;--disable-gpu&apos;)</span>

driver = webdriver.Chrome()
<span class="hljs-keyword">try</span>:
    driver.get(<span class="hljs-string">&apos;https://accounts.douban.com/login?alias=&amp;redir=https%3A%2F%2Fwww.douban.com%2F&amp;source=index_nav&amp;error=1016&apos;</span>)
    <span class="hljs-comment"># find_element(By...) works on both selenium 3 and selenium 4.</span>
    driver.find_element(By.ID, <span class="hljs-string">&apos;email&apos;</span>).send_keys(DOUBAN_ACCOUNT)
    driver.find_element(By.ID, <span class="hljs-string">&apos;password&apos;</span>).send_keys(DOUBAN_PASSWORD)

    <span class="hljs-comment"># page_source is the HTML of the page currently loaded in the browser.</span>
    html_str = driver.page_source
    html_ele = etree.HTML(html_str)
    captcha_src = html_ele.xpath(<span class="hljs-string">&apos;//img[@id=&quot;captcha_image&quot;]/@src&apos;</span>)

    <span class="hljs-comment"># xpath returns an empty list when the page has no captcha image;</span>
    <span class="hljs-comment"># only call the recognition service when one is present.</span>
    <span class="hljs-keyword">if</span> captcha_src:
        response = requests.get(captcha_src[<span class="hljs-number">0</span>])

        <span class="hljs-comment"># base64-encode the captcha image bytes</span>
        v_pic = base64.b64encode(response.content)
        <span class="hljs-comment"># captcha type sent to the recognition service</span>
        v_type = <span class="hljs-string">&apos;cn&apos;</span>

        <span class="hljs-comment"># form fields of the recognition request</span>
        form_data = {
            <span class="hljs-string">&apos;v_pic&apos;</span>: v_pic,
            <span class="hljs-string">&apos;v_type&apos;</span>: v_type
        }

        <span class="hljs-comment"># the recognition request is authorized through this header</span>
        headers = {
            <span class="hljs-string">&apos;Authorization&apos;</span>: <span class="hljs-string">&apos;APPCODE &apos;</span> + DAMA_APPCODE
        }

        dama_url = <span class="hljs-string">&apos;http://yzmplus.market.alicloudapi.com/fzyzm&apos;</span>

        response = requests.post(dama_url, data=form_data, headers=headers)
        print(response.text)
        res_dict = response.json()
        valid_image = res_dict[<span class="hljs-string">&apos;v_code&apos;</span>]
        driver.find_element(By.ID, <span class="hljs-string">&apos;captcha_field&apos;</span>).send_keys(valid_image)

    driver.find_element(By.CLASS_NAME, <span class="hljs-string">&apos;btn-submit&apos;</span>).click()

    <span class="hljs-comment"># Join the browser cookies into one Cookie header value.</span>
    cookies = <span class="hljs-string">&apos;; &apos;</span>.join(
        cookie[<span class="hljs-string">&apos;name&apos;</span>] + <span class="hljs-string">&apos;=&apos;</span> + cookie[<span class="hljs-string">&apos;value&apos;</span>] <span class="hljs-keyword">for</span> cookie <span class="hljs-keyword">in</span> driver.get_cookies()
    )
<span class="hljs-keyword">finally</span>:
    <span class="hljs-comment"># Always quit the browser, even on errors, so no Chrome process is left running.</span>
    driver.quit()

<span class="hljs-comment"># Reuse the logged-in cookies with requests to fetch a page that needs login.</span>
url = <span class="hljs-string">&apos;https://www.douban.com/mine/wallet/#/all-spending?page=1&apos;</span>
headers = {
    <span class="hljs-string">&apos;Cookie&apos;</span>: cookies,
    <span class="hljs-string">&apos;User-Agent&apos;</span>: <span class="hljs-string">&apos;Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.92 Safari/537.36&apos;</span>
}
response = requests.get(url, headers=headers)

<span class="hljs-keyword">with</span> open(<span class="hljs-string">&apos;douban_money2.html&apos;</span>, <span class="hljs-string">&apos;wb&apos;</span>) <span class="hljs-keyword">as</span> f:
    f.write(response.content)
</code></pre>
<hr>
<h1 id="selenium-&#x7684;&#x7528;&#x5904;">Selenium &#x7684;&#x7528;&#x5904;</h1>
<p>&#x5F53;&#x9875;&#x9762;&#x4E2D;&#x6709;&#x9700;&#x8981;javascript&#x53BB;&#x52A8;&#x6001;&#x52A0;&#x8F7D;&#x7684;&#x5185;&#x5BB9;&#x7684;&#x65F6;&#x5019;&#xFF0C; &#x6211;&#x4EEC;&#x53C8;&#x4E0D;&#x597D;&#x6A21;&#x62DF;&#x8FD9;&#x4E2A;javascript&#xFF0C; &#x90A3;&#x4E48;&#x6211;&#x4EEC;&#x53EF;&#x4EE5;&#x901A;&#x8FC7;selenium&#x8FDB;&#x884C;&#x83B7;&#x53D6;&#x9875;&#x9762;&#x3002;</p>
<ol>
<li><p>&#x5982;&#x679C;&#x9875;&#x9762;&#x9700;&#x8981;&#x52A8;&#x6001;&#x52A0;&#x8F7D;&#x6570;&#x636E;&#xFF0C; &#x8FD9;&#x4E9B;&#x6570;&#x636E;&#x53C8;&#x5305;&#x542B;&#x5728;javascript&#x4E2D;&#xFF0C; &#x6211;&#x4EEC;&#x4E0D;&#x5BB9;&#x6613;&#x83B7;&#x53D6;&#x5230;&#xFF0C;&#x5C31;&#x53EF;&#x4EE5;&#x5E94;&#x7528;selenium&#x8FDB;&#x884C;&#x83B7;&#x53D6;html&#xFF0C; &#x8FD9;&#x65F6;&#x7684;html&#x662F;&#x5DF2;&#x7ECF;&#x7ECF;&#x8FC7;&#x6D4F;&#x89C8;&#x5668;&#x6E32;&#x67D3;&#x540E;&#x7684;&#x9875;&#x9762;&#x4E86;&#x3002;</p>
</li>
<li><p>&#x5F88;&#x591A;&#x65F6;&#x5019;&#xFF0C;&#x5728;&#x767B;&#x5F55;&#x65F6;&#x9700;&#x8981;&#x6709;&#x52A0;&#x5BC6;&#xFF0C;&#x6240;&#x4EE5;&#x6211;&#x4EEC;&#x53EF;&#x4EE5;&#x901A;&#x8FC7;selenium&#x767B;&#x5F55;&#xFF0C;&#x83B7;&#x53D6;cookie&#xFF0C;&#x8BBE;&#x7F6E;cookie&#x540E;&#x5C31;&#x53EF;&#x4EE5;&#x4EFB;&#x610F;&#x7684;&#x8BBF;&#x95EE;&#x9875;&#x9762;&#x4E86;&#x3002;</p>
</li>
</ol>
<hr>

                    
                    </section>
                
                
                </div>
            </div>
        </div>

        
        <a href="../代理/proxy.html" class="navigation navigation-prev " aria-label="Previous page: ip代理池项目"><i class="fa fa-angle-left"></i></a>
        
        
        <a href="../进程线程协程/introduce.html" class="navigation navigation-next " aria-label="Next page: 进程线程协程"><i class="fa fa-angle-right"></i></a>
        
    </div>
</div>

        
<script src="../gitbook/app.js"></script>

    
    <script src="../gitbook/plugins/gitbook-plugin-search/lunr.min.js"></script>
    

    
    <script src="../gitbook/plugins/gitbook-plugin-search/search.js"></script>
    

    
    <script src="../gitbook/plugins/gitbook-plugin-sharing/buttons.js"></script>
    

    
    <script src="../gitbook/plugins/gitbook-plugin-fontsettings/buttons.js"></script>
    

<script>
// Request the "gitbook" module and start it with this page's plugin settings.
require(["gitbook"], function(gitbook) {
    gitbook.start({
        "highlight": {},
        "search": {
            "maxIndexSize": 1000000
        },
        "sharing": {
            "facebook": true,
            "twitter": true,
            "google": false,
            "weibo": false,
            "instapaper": false,
            "vk": false,
            "all": ["facebook", "google", "twitter", "weibo", "instapaper"]
        },
        "fontsettings": {
            "theme": "white",
            "family": "sans",
            "size": 2
        }
    });
});
</script>

        
    </body>
    
</html>
